#!/usr/bin/env bash
# Copyright (c) 2023, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Usage: <this script> MODEL_NAME
#
# Sends one sample streaming generation request for MODEL_NAME to the
# generate_stream endpoint of the server listening on localhost:8000 and
# prints the response to stdout.

if [[ -z "${1:-}" ]]; then
    # Diagnostics go to stderr so they never mix with response data on stdout.
    echo "Provide model name as the first argument" >&2
    exit 1
fi

# Replace every '-' and '/' with '_': Triton does not allow these characters
# in model names, and the server script applies the same substitution.
MODEL_NAME=${1//-/_}
MODEL_NAME=${MODEL_NAME//\//_}

# The URL is quoted so that a model name containing whitespace or glob
# characters still reaches curl as a single argument.
#   -sS  hide the progress meter but still report errors
#   -N   disable curl's output buffering so streamed chunks appear as they arrive
#   -w   print a trailing newline once the transfer completes
curl "http://localhost:8000/v2/models/${MODEL_NAME}/generate_stream" \
    -H "Content-Type: application/json" \
    -sS \
    -N \
    -w "\n" \
    -d '{
        "prompt": "San Francisco is a",
        "max_tokens": 128,
        "temperature": 0,
        "stream": true
    }'